#!/anaconda3/bin/python
#-*- coding:utf-8 -*-

#CrawUnivRankingA.py
import sys
import requests
from bs4 import BeautifulSoup
import bs4


def getHTMLText(url):
    try:
        r = requests.get(url, timeout=30)
        r.raise_for_status()
        r.encoding = r.apparent_encoding
        return r.text
    except:
        return ""


def fillUnivList(ulist, html):
    soup = BeautifulSoup(html, "html.parser")
    for tr in soup.find('tbody').children:
        if isinstance(tr, bs4.element.Tag):
            tds = tr('td')
            ulist.append(
                [tds[0].string, tds[1].string, tds[3].string, tds[2].string])


def printUnivList(ulist, num):
    print("{:^10}\t{:^16}\t{:^10}\t{:^10}".format("排名", "学校名称", "总分", "地区"))
    for i in range(num):
        u = ulist[i]
        print("{:^10}\t{:^16}\t{:^10}\t{:^10}".format(u[0], u[1], u[2], u[3]))


def main():
    uinfo = []
    url = 'http://www.zuihaodaxue.cn/zuihaodaxuepaiming2018.html'
    html = getHTMLText(url)
    fillUnivList(uinfo, html)
    printUnivList(uinfo, 100)  # 20 univs


if __name__ == '__main__':
    main()
